% Journal article with volume, issue, and page data. The page range is written
% with a double hyphen so bibliography styles typeset it as an en dash.
@article{entry_article_one,
  author  = {Alice Smith and Bob Johnson},
  title   = {Exploring Article Formats},
  journal = {Journal of Examples},
  volume  = {42},
  number  = {3},
  pages   = {101--120},
  year    = {2012},
}

% Two-author book; the address field carries the publisher location.
@book{entry_book_foundations,
  author    = {Carla Ruiz and Deepak Patel},
  title     = {Foundations of Structured Documents},
  publisher = {Example Press},
  address   = {Berlin},
  year      = {2010},
}

% Conference paper; booktitle names the proceedings volume. The page range is
% written with a double hyphen so styles typeset it as an en dash.
@inproceedings{entry_inproceedings_parallel,
  author    = {Ethan Lee and Fatima Khan},
  title     = {Parallel Parsing Techniques},
  booktitle = {Proceedings of the Structured Data Conference},
  pages     = {55--68},
  year      = {2019},
}

% Doctoral thesis recorded with author, title, school, and year.
@phdthesis{entry_phdthesis_semantics,
  author = {Grace Muller},
  title  = {Semantics Aware Document Pipelines},
  school = {University of Hamburg},
  year   = {2015},
}

% Master's thesis recorded with author, title, school, and year.
@mastersthesis{entry_mastersthesis_design,
  author = {Hugo Silva},
  title  = {Designing Resilient Extraction Systems},
  school = {Technical University of Lisbon},
  year   = {2018},
}

% Technical report; the number field holds the report identifier.
@techreport{entry_techreport_scalability,
  author      = {Ingrid Novak},
  title       = {Scalability Benchmarks for Extraction Engines},
  institution = {Alpine Research Labs},
  number      = {ARL-TR-011},
  year        = {2011},
}

% Reference manual issued by an organization. The proper noun in the title is
% braced so that styles which sentence-case titles keep its capital letter.
@manual{entry_manual_reference,
  author       = {Javier Torres},
  title        = {{Kreuzberg} Reference Manual},
  organization = {Kreuzberg Labs},
  year         = {2005},
}

% Miscellaneous entry for a dataset: howpublished names where it was released
% and note records the version.
@misc{entry_misc_dataset,
  author       = {Keiko Tanaka},
  title        = {Annotated Extraction Dataset},
  howpublished = {Dataset Repository},
  year         = {2022},
  note         = {Version 3.2},
}

% Unpublished draft; the note field is required for this entry type.
@unpublished{entry_unpublished_notes,
  author = {Liam O'Connor},
  title  = {Notes on Incremental Extraction},
  year   = {2021},
  note   = {Draft manuscript},
}

% Contribution to a collection: title is the contribution, booktitle is the
% containing volume, and chapter gives its position in that volume.
@incollection{entry_incollection_story,
  author    = {Mei Huang},
  title     = {Story Driven Testing},
  booktitle = {Modern Document Pipelines},
  chapter   = {4},
  publisher = {Insight Publishing},
  year      = {2016},
}

% Part of a book, located by its chapter number.
@inbook{entry_inbook_chapter,
  author    = {Noah Becker},
  title     = {Advanced Pipeline Patterns},
  chapter   = {11},
  publisher = {TechWorks},
  year      = {2009},
}

% Whole proceedings volume, credited to its editor. The acronym in the title is
% braced so that styles which sentence-case titles do not lowercase it.
@proceedings{entry_proceedings_ai,
  editor = {Olivia Rossi},
  title  = {Proceedings of the {AI} Extraction Summit},
  year   = {2017},
}

% Booklet without a named publisher; howpublished describes how it circulated.
@booklet{entry_booklet_summary,
  author       = {Priya Desai},
  title        = {Summary of Extraction Benchmarks},
  howpublished = {Internal Memo},
  year         = {2014},
}

% Journal article recorded with volume and issue number but no page range.
@article{entry_article_modern,
  author  = {Quinn Parker},
  title   = {Modern Approaches to Layout Analysis},
  journal = {International Journal of OCR},
  volume  = {7},
  number  = {1},
  year    = {2020},
}

% Single-author book with only author, title, publisher, and year.
@book{entry_book_distributed,
  author    = {Rina Haddad},
  title     = {Distributed Text Processing},
  publisher = {Northern Lights},
  year      = {2002},
}

% Workshop paper; booktitle names the workshop proceedings. The page range is
% written with a double hyphen so styles typeset it as an en dash.
@inproceedings{entry_inproceedings_reproducibility,
  author    = {Samuel Ortega},
  title     = {Reproducible Extraction Pipelines},
  booktitle = {Workshop on Reliable NLP},
  pages     = {12--20},
  year      = {2013},
}

% Journal article carrying only author, title, journal, and year.
@article{entry_article_architecture,
  author  = {Talia Cohen},
  title   = {Architecture Patterns for Extractors},
  journal = {Systems Journal},
  year    = {2008},
}

% Technical report recorded without a report number.
@techreport{entry_techreport_innovation,
  author      = {Umar Farouk},
  title       = {Innovation in Document Processing},
  institution = {Global Research Institute},
  year        = {2006},
}

% Booklet described by a free-form note. The acronym in the title is braced
% because standard styles sentence-case booklet titles and would otherwise
% render it in lowercase.
@booklet{entry_booklet_research,
  author = {Valeria Costa},
  title  = {Research Highlights in {OCR}},
  year   = {1998},
  note   = {Conference supplement},
}

% Journal article carrying only author, title, journal, and year.
@article{entry_article_future,
  author  = {Wei Zhang},
  title   = {Future of Unified Extraction},
  journal = {Journal of Pipeline Research},
  year    = {2024},
}
